# 数据读取
import pandas as pd

# Load the job postings table; the path is relative to the current working
# directory.
data = pd.read_csv('data/job.csv')
# Display options: lift pandas' row/column limits so printed frames are not
# truncated.
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

# --- Disabled exploratory / preprocessing steps (commented out) ---
# Duplicate-row check
# print(data.duplicated().value_counts())
# Missing-value handling
# print(data.fillna({"last_active": "未知", "address": "未知", "hiring_manager": "未知"}, inplace=True))
# print(data.isnull().any())
# print(data['City'].isnull() == True)
# print(data.isnull())
# Data normalization
# for i in range(12, 30):
#     data['salary'] = data['salary'].str.replace('·' + str(i) + '薪', '')
# data['description'] = data['description'].str.replace('?', '')
# data.to_csv('data/processed_data.csv', index=False)
# print(data['job'] == '其它')

# Count the rows whose 'job' / 'category' value is the label '其它'.
# value_counts() only contains entries for values that actually occur, so
# indexing it with ['其它'] raises KeyError when no row carries that label;
# .get(..., 0) reports a count of zero in that case instead of crashing.
count = data['job'].value_counts().get('其它', 0)

print("计数结果:", count)
count2 = data['category'].value_counts().get('其它', 0)
print("计数结果:", count2)